% NOTE(review): the exported "volume = 4" was dropped (single-volume book); the address comes from the original fused publisher string -- confirm.
@book{abu2012learning,
  author    = {Abu-Mostafa, Yaser S. and Magdon-Ismail, Malik and Lin, Hsuan-Tien},
  title     = {Learning from Data},
  publisher = {AMLBook},
  address   = {New York},
  year      = {2012},
}
@misc{altay_2020,
  author       = {Altay, Gabriel},
  title        = {Categorical variables in decision trees},
  howpublished = {Kaggle},
  year         = {2020},
  month        = mar,
  url          = {https://www.kaggle.com/code/gabrielaltay/categorical-variables-in-decision-trees},
}
@book{arpaci2018operating,
  author    = {Arpaci-Dusseau, Remzi H. and Arpaci-Dusseau, Andrea C.},
  title     = {Operating Systems: Three Easy Pieces},
  publisher = {Arpaci-Dusseau Books, LLC},
  year      = {2018},
}

@inproceedings{arapakis2014impact,
  author    = {Arapakis, Ioannis and Bai, Xiao and Cambazoglu, B. Barla},
  title     = {Impact of response latency on user behavior in web search},
  booktitle = {Proceedings of the 37th international ACM SIGIR conference on Research \& development in information retrieval},
  pages     = {103--112},
  year      = {2014},
}
@article{cong2016novel,
  author    = {Cong, Yingnan and Chan, Yao-ban and Ragan, Mark A.},
  title     = {A novel alignment-free method for detection of lateral genetic transfer based on {TF-IDF}},
  journal   = {Scientific Reports},
  volume    = {6},
  number    = {1},
  pages     = {1--13},
  publisher = {Springer},
  year      = {2016},
}
@article{bengio2013representation,
  author    = {Bengio, Yoshua and Courville, Aaron and Vincent, Pascal},
  title     = {Representation learning: A review and new perspectives},
  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume    = {35},
  number    = {8},
  pages     = {1798--1828},
  publisher = {IEEE},
  year      = {2013},
}

@article{gabin2023keyword,
  author  = {Gab{\'\i}n, Jorge and Ares, M. Eduardo and Parapar, Javier},
  title   = {Keyword Embeddings for Query Suggestion},
  journal = {arXiv preprint arXiv:2301.08006},
  year    = {2023},
}

@article{castells2023recommender,
  author  = {Castells, Pablo and Jannach, Dietmar},
  title   = {Recommender Systems: A Primer},
  journal = {arXiv preprint arXiv:2302.02579},
  year    = {2023},
}
@article{chandrasekaran2021evolution,
  author    = {Chandrasekaran, Dhivya and Mago, Vijay},
  title     = {Evolution of semantic similarity---a survey},
  journal   = {ACM Computing Surveys (CSUR)},
  volume    = {54},
  number    = {2},
  pages     = {1--37},
  publisher = {ACM New York, NY, USA},
  year      = {2021},
}
@inproceedings{cheng2016wide,
  author    = {Cheng, Heng-Tze and Koc, Levent and Harmsen, Jeremiah and Shaked, Tal and Chandra, Tushar and Aradhye, Hrishi and Anderson, Glen and Corrado, Greg and Chai, Wei and Ispir, Mustafa and others},
  title     = {Wide \& deep learning for recommender systems},
  booktitle = {Proceedings of the 1st workshop on deep learning for recommender systems},
  year      = {2016},
  pages     = {7--10},
}
@book{chollet2021deep,
  author    = {Chollet, Fran{\c{c}}ois},
  title     = {Deep Learning with {Python}},
  publisher = {Simon and Schuster},
  year      = {2021},
}
@inproceedings{collobert2008unified,
  author    = {Collobert, Ronan and Weston, Jason},
  title     = {A unified architecture for natural language processing: Deep neural networks with multitask learning},
  booktitle = {Proceedings of the 25th international conference on Machine learning},
  year      = {2008},
  pages     = {160--167},
}
@inproceedings{covington2016deep,
  author    = {Covington, Paul and Adams, Jay and Sargin, Emre},
  title     = {Deep neural networks for {YouTube} recommendations},
  booktitle = {Proceedings of the 10th ACM conference on recommender systems},
  pages     = {191--198},
  year      = {2016},
}
@inproceedings{cvitanic2016lda,
  author    = {Cvitanic, Toni and Lee, Bumsoo and Song, Hyeon Ik and Fu, Katherine and Rosen, David},
  title     = {{LDA} v. {LSA}: A comparison of two computational text analysis tools for the functional categorization of patents},
  booktitle = {International Conference on Case-Based Reasoning},
  year      = {2016},
}
@article{devlin2018bert,
  author  = {Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
  title   = {{BERT}: Pre-training of deep bidirectional transformers for language understanding},
  journal = {arXiv preprint arXiv:1810.04805},
  year    = {2018},
}
@article{di2021considerations,
  author    = {Di Gennaro, Giovanni and Buonanno, Amedeo and Palmieri, Francesco A. N.},
  title     = {Considerations about learning {Word2Vec}},
  journal   = {The Journal of Supercomputing},
  pages     = {1--16},
  publisher = {Springer},
  year      = {2021},
}
% NOTE(review): month set to jan to match the date in the title and URL (2023/01/21); the exported "Feb" looked like an access date.
@misc{doctorow_2023,
  author       = {Doctorow, Cory},
  title        = {Pluralistic: {TikTok}'s enshittification (21 Jan 2023)},
  howpublished = {Pluralistic: Daily links from Cory Doctorow},
  year         = {2023},
  month        = jan,
  url          = {https://pluralistic.net/2023/01/21/potemkin-ai/#hey-guys},
}
% NOTE(review): howpublished was inferred from the URL host (netflixtechblog.com) -- confirm the preferred venue name.
@misc{dye_ekandham_saluja_rastogi_2020,
  author       = {Dye, Melody and Ekandham, Chaitanya and Saluja, Avneesh and Rastogi, Ashish},
  title        = {Supporting content decision makers with machine learning},
  howpublished = {Netflix Technology Blog},
  year         = {2020},
  month        = dec,
  url          = {https://netflixtechblog.com/supporting-content-decision-makers-with-machine-learning-995b7b76006f},
}
@article{ekstrand2019recommender,
  author  = {Ekstrand, Michael D. and Konstan, Joseph A.},
  title   = {Recommender systems notation: proposed common notation for teaching and research},
  journal = {arXiv preprint arXiv:1902.01348},
  year    = {2019},
}
@inproceedings{el2022twhin,
  author    = {El-Kishky, Ahmed and Markovich, Thomas and Park, Serim and Verma, Chetan and Kim, Baekjin and Eskander, Ramy and Malkov, Yury and Portman, Frank and Samaniego, Sof{\'\i}a and Xiao, Ying and others},
  title     = {{TwHIN}: Embedding the {Twitter} heterogeneous information network for personalized recommendation},
  booktitle = {Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining},
  pages     = {2842--2850},
  year      = {2022},
}
@inproceedings{flach2013reducing,
  author    = {Flach, Tobias and Dukkipati, Nandita and Terzis, Andreas and Raghavan, Barath and Cardwell, Neal and Cheng, Yuchung and Jain, Ankur and Hao, Shuai and Katz-Bassett, Ethan and Govindan, Ramesh},
  title     = {Reducing web latency: the virtue of gentle aggression},
  booktitle = {Proceedings of the ACM SIGCOMM 2013 conference on SIGCOMM},
  year      = {2013},
  pages     = {159--170},
}
@book{fowler2012patterns,
  author    = {Fowler, Martin},
  title     = {Patterns of Enterprise Application Architecture},
  publisher = {Addison-Wesley},
  year      = {2012},
}

@article{gerbrands1981relationships,
  author    = {Gerbrands, Jan J.},
  title     = {On the relationships between {SVD}, {KLT} and {PCA}},
  journal   = {Pattern Recognition},
  volume    = {14},
  number    = {1--6},
  pages     = {375--381},
  publisher = {Elsevier},
  year      = {1981},
}
@article{goldberg1992using,
  author    = {Goldberg, David and Nichols, David and Oki, Brian M. and Terry, Douglas},
  title     = {Using collaborative filtering to weave an information tapestry},
  journal   = {Communications of the ACM},
  volume    = {35},
  number    = {12},
  pages     = {61--70},
  publisher = {ACM New York, NY, USA},
  year      = {1992},
}
@article{goldberg2014word2vec,
  author  = {Goldberg, Yoav and Levy, Omer},
  title   = {{word2vec} Explained: deriving {Mikolov} et al.'s negative-sampling word-embedding method},
  journal = {arXiv preprint arXiv:1402.3722},
  year    = {2014},
}
@article{goldberg2017neural,
  author    = {Goldberg, Yoav},
  title     = {Neural network methods for natural language processing},
  journal   = {Synthesis lectures on human language technologies},
  publisher = {Morgan \& Claypool Publishers},
  year      = {2017},
  volume    = {10},
  number    = {1},
  pages     = {1--309},
}
@inproceedings{gomez2022learning,
  author    = {Gomez Bruballa, Raul and Burnham-King, Lauren and Sala, Alessandra},
  title     = {Learning Users' Preferred Visual Styles in an Image Marketplace},
  booktitle = {Proceedings of the 16th ACM Conference on Recommender Systems},
  pages     = {466--468},
  year      = {2022},
}
@book{gregg2014systems,
  author    = {Gregg, Brendan},
  title     = {Systems Performance: Enterprise and the Cloud},
  publisher = {Pearson Education},
  year      = {2014},
}
@inproceedings{grbovic2018real,
  author    = {Grbovic, Mihajlo and Cheng, Haibin},
  title     = {Real-time personalization using embeddings for search ranking at {Airbnb}},
  booktitle = {Proceedings of the 24th ACM SIGKDD international conference on knowledge discovery \& data mining},
  pages     = {311--320},
  year      = {2018},
}

@inproceedings{hansen2020contextual,
  author    = {Hansen, Casper and Hansen, Christian and Maystre, Lucas and Mehrotra, Rishabh and Brost, Brian and Tomasi, Federico and Lalmas, Mounia},
  title     = {Contextual and sequential user embeddings for large-scale music recommendation},
  booktitle = {Proceedings of the 14th ACM Conference on Recommender Systems},
  pages     = {53--62},
  year      = {2020},
}
@inproceedings{he2017neural,
  author    = {He, Xiangnan and Liao, Lizi and Zhang, Hanwang and Nie, Liqiang and Hu, Xia and Chua, Tat-Seng},
  title     = {Neural collaborative filtering},
  booktitle = {Proceedings of the 26th international conference on world wide web},
  year      = {2017},
  pages     = {173--182},
}
@article{hooker2021hardware,
  author    = {Hooker, Sara},
  title     = {The hardware lottery},
  journal   = {Communications of the ACM},
  publisher = {ACM New York, NY, USA},
  year      = {2021},
  volume    = {64},
  number    = {12},
  pages     = {58--65},
}
@inproceedings{hong2011predicting,
  author    = {Hong, Liangjie and Dan, Ovidiu and Davison, Brian D.},
  title     = {Predicting popular messages in {Twitter}},
  booktitle = {Proceedings of the 20th international conference companion on World wide web},
  pages     = {57--58},
  year      = {2011},
}
@inproceedings{houle2010can,
  author    = {Houle, Michael E. and Kriegel, Hans-Peter and Kr{\"o}ger, Peer and Schubert, Erich and Zimek, Arthur},
  title     = {Can shared-neighbor distances defeat the curse of dimensionality?},
  booktitle = {Scientific and Statistical Database Management: 22nd International Conference, SSDBM 2010, Heidelberg, Germany, June 30--July 2, 2010. Proceedings 22},
  pages     = {482--500},
  publisher = {Springer},
  year      = {2010},
}
@book{jannach2010recommender,
  author    = {Jannach, Dietmar and Zanker, Markus and Felfernig, Alexander and Friedrich, Gerhard},
  title     = {Recommender Systems: An Introduction},
  publisher = {Cambridge University Press},
  year      = {2010},
}
@inproceedings{jing2015visual,
  author    = {Jing, Yushi and Liu, David and Kislyuk, Dmitry and Zhai, Andrew and Xu, Jiajing and Donahue, Jeff and Tavel, Sarah},
  title     = {Visual search at {Pinterest}},
  booktitle = {Proceedings of the 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining},
  pages     = {1889--1898},
  year      = {2015},
}
% NOTE(review): year corrected to 1998 to agree with the ECML-98 booktitle; the citation key keeps its exported "2005" so existing citations still resolve.
@inproceedings{joachims2005text,
  author    = {Joachims, Thorsten},
  title     = {Text categorization with support vector machines: Learning with many relevant features},
  booktitle = {Machine Learning: ECML-98: 10th European Conference on Machine Learning Chemnitz, Germany, April 21--23, 1998 Proceedings},
  pages     = {137--142},
  publisher = {Springer},
  year      = {1998},
}

% NOTE(review): the exported journal field only repeated the title; howpublished was inferred from the URL host -- confirm.
@misc{karpathy_2015,
  author       = {Karpathy, Andrej},
  title        = {The Unreasonable Effectiveness of Recurrent Neural Networks},
  howpublished = {Andrej Karpathy blog},
  year         = {2015},
  month        = may,
  url          = {https://karpathy.github.io/2015/05/21/rnn-effectiveness/},
}
@book{klein2013coding,
  author    = {Klein, Philip N.},
  title     = {Coding the Matrix: Linear Algebra Through Applications to Computer Science},
  publisher = {Newtonian Press},
  year      = {2013},
  isbn      = {9780615880990},
  url       = {https://books.google.com/books?id=3AA4nwEACAAJ},
}
@book{kleppmann2017designing,
  author    = {Kleppmann, Martin},
  title     = {Designing Data-Intensive Applications: The Big Ideas Behind Reliable, Scalable, and Maintainable Systems},
  publisher = {O'Reilly Media, Inc.},
  year      = {2017},
}
@article{kvernadze2022two,
  author  = {Kvernadze, Giorgi and Sudyanti, Putu Ayu G. and Subedi, Nishan and Hajiaghayi, Mohammad},
  title   = {Two Is Better Than One: Dual Embeddings for Complementary Product Recommendations},
  journal = {arXiv preprint arXiv:2211.14982},
  year    = {2022},
}
@book{kreps2014heart,
  author    = {Kreps, Jay},
  title     = {I Heart Logs: Event Data, Stream Processing, and Data Integration},
  publisher = {O'Reilly Media, Inc.},
  year      = {2014},
}
@article{kreuzberger2022machine,
  author  = {Kreuzberger, Dominik and K{\"u}hl, Niklas and Hirschl, Sebastian},
  title   = {Machine learning operations ({MLOps}): Overview, definition, and architecture},
  journal = {arXiv preprint arXiv:2205.02302},
  year    = {2022},
}
@book{lakshmanan2020machine,
  author    = {Lakshmanan, Valliappa and Robinson, Sara and Munn, Michael},
  title     = {Machine Learning Design Patterns},
  publisher = {O'Reilly Media},
  year      = {2020},
}
@article{lecun1998gradient,
  author    = {LeCun, Yann and Bottou, L{\'e}on and Bengio, Yoshua and Haffner, Patrick},
  title     = {Gradient-based learning applied to document recognition},
  journal   = {Proceedings of the IEEE},
  volume    = {86},
  number    = {11},
  pages     = {2278--2324},
  publisher = {IEEE},
  year      = {1998},
}
% Journal, volume, issue and pages were recovered from the mangled exported title ("nature, 521 (7553), 436-444").
% NOTE(review): "and others" was dropped on the understanding that the paper has exactly these three authors -- confirm.
@article{lecun2015deep,
  author  = {LeCun, Yann and Bengio, Yoshua and Hinton, Geoffrey},
  title   = {Deep learning},
  journal = {Nature},
  volume  = {521},
  number  = {7553},
  pages   = {436--444},
  year    = {2015},
}
@book{leskovec2020mining,
  author    = {Leskovec, Jure and Rajaraman, Anand and Ullman, Jeffrey David},
  title     = {Mining of Massive Data Sets},
  publisher = {Cambridge University Press},
  year      = {2020},
}

@article{levy2014neural,
  author  = {Levy, Omer and Goldberg, Yoav},
  title   = {Neural word embedding as implicit matrix factorization},
  journal = {Advances in neural information processing systems},
  year    = {2014},
  volume  = {27},
}
@inproceedings{liu2022twice,
  author    = {Liu, Xianjing and Golshan, Behzad and Leung, Kenny and Saini, Aman and Kulkarni, Vivek and Mollahosseini, Ali and Mo, Jeff},
  title     = {Twice-Twitter Content Embeddings},
  booktitle = {CIKM 2022},
  year      = {2022},
}
@inproceedings{lv2011documents,
  author    = {Lv, Yuanhua and Zhai, ChengXiang},
  title     = {When documents are very long, {BM25} fails!},
  booktitle = {Proceedings of the 34th international ACM SIGIR conference on Research and development in Information Retrieval},
  pages     = {1103--1104},
  year      = {2011},
}
@book{meadows2008thinking,
  author    = {Meadows, Donella H.},
  title     = {Thinking in Systems: A Primer},
  publisher = {Chelsea Green Publishing},
  year      = {2008},
}
@article{meil2023ai,
  author    = {Meil, Doug},
  title     = {{AI} in the Enterprise},
  journal   = {Communications of the ACM},
  volume    = {66},
  number    = {6},
  pages     = {6--7},
  publisher = {ACM New York, NY, USA},
  year      = {2023},
}
@article{mikolov2013efficient,
  author  = {Mikolov, Tomas and Chen, Kai and Corrado, Greg and Dean, Jeffrey},
  title   = {Efficient estimation of word representations in vector space},
  journal = {arXiv preprint arXiv:1301.3781},
  year    = {2013},
}
@article{naseem2021comprehensive,
  author    = {Naseem, Usman and Razzak, Imran and Khan, Shah Khalid and Prasad, Mukesh},
  title     = {A comprehensive survey on word representation models: From classical to state-of-the-art word representation language models},
  journal   = {Transactions on Asian and Low-Resource Language Information Processing},
  publisher = {ACM New York, NY},
  year      = {2021},
  volume    = {20},
  number    = {5},
  pages     = {1--35},
}
@article{oancea2014gpgpu,
  author  = {Oancea, Bogdan and Andrei, Tudorel and Dragoescu, Raluca Mariana},
  title   = {{GPGPU} computing},
  journal = {arXiv preprint arXiv:1408.6923},
  year    = {2014},
}
@inproceedings{pal2020pinnersage,
  author    = {Pal, Aditya and Eksombatchai, Chantat and Zhou, Yitong and Zhao, Bo and Rosenberg, Charles and Leskovec, Jure},
  title     = {{PinnerSage}: Multi-modal user embedding framework for recommendations at {Pinterest}},
  booktitle = {Proceedings of the 26th ACM SIGKDD International Conference on Knowledge Discovery \& Data Mining},
  pages     = {2311--2320},
  year      = {2020},
}
@book{rao2019natural,
  author    = {Rao, Delip and McMahan, Brian},
  title     = {Natural Language Processing with {PyTorch}: Build Intelligent Language Applications Using Deep Learning},
  publisher = {O'Reilly Media, Inc.},
  year      = {2019},
}
@article{raschka2018model,
  author  = {Raschka, Sebastian},
  title   = {Model evaluation, model selection, and algorithm selection in machine learning},
  journal = {arXiv preprint arXiv:1811.12808},
  year    = {2018},
}
@inproceedings{rendle2020neural,
  author    = {Rendle, Steffen and Krichene, Walid and Zhang, Li and Anderson, John},
  title     = {Neural collaborative filtering vs. matrix factorization revisited},
  booktitle = {Proceedings of the 14th ACM Conference on Recommender Systems},
  year      = {2020},
  pages     = {240--248},
}
@article{rumelhart1986learning,
  author    = {Rumelhart, David E. and Hinton, Geoffrey E. and Williams, Ronald J.},
  title     = {Learning representations by back-propagating errors},
  journal   = {Nature},
  volume    = {323},
  number    = {6088},
  pages     = {533--536},
  publisher = {Nature Publishing Group UK London},
  year      = {1986},
}
@article{russakovsky2015imagenet,
  author    = {Russakovsky, Olga and Deng, Jia and Su, Hao and Krause, Jonathan and Satheesh, Sanjeev and Ma, Sean and Huang, Zhiheng and Karpathy, Andrej and Khosla, Aditya and Bernstein, Michael and others},
  title     = {{ImageNet} large scale visual recognition challenge},
  journal   = {International Journal of Computer Vision},
  volume    = {115},
  pages     = {211--252},
  publisher = {Springer},
  year      = {2015},
}
@inproceedings{rush2018annotated,
  author    = {Rush, Alexander M.},
  title     = {The annotated transformer},
  booktitle = {Proceedings of workshop for NLP open source software (NLP-OSS)},
  pages     = {52--60},
  year      = {2018},
}
% NOTE(review): authors reordered to the book's published order (Manning, Raghavan, Schutze) -- confirm; the key is unchanged so existing citations still resolve.
% The exported "volume = 39" was dropped (single-volume book) and the city was split out of the publisher string.
@book{schutze2008introduction,
  author    = {Manning, Christopher D. and Raghavan, Prabhakar and Sch{\"u}tze, Hinrich},
  title     = {Introduction to Information Retrieval},
  publisher = {Cambridge University Press},
  address   = {Cambridge},
  year      = {2008},
}
@misc{sculley2014machine,
  author = {Sculley, David and Holt, Gary and Golovin, Daniel and Davydov, Eugene and Phillips, Todd and Ebner, Dietmar and Chaudhary, Vinay and Young, Michael},
  title  = {Machine learning: The high interest credit card of technical debt},
  year   = {2014},
}
@book{seaver2022computing,
  author    = {Seaver, Nick},
  title     = {Computing Taste: Algorithms and the Makers of Music Recommendation},
  publisher = {University of Chicago Press},
  year      = {2022},
}
@misc{Shabani_2023,
  author       = {Shabani, Reza},
  title        = {How to train your own large language models},
  howpublished = {Replit Blog},
  year         = {2023},
  month        = apr,
  url          = {https://blog.replit.com/llm-training},
}
@article{sharir2020cost,
  author  = {Sharir, Or and Peleg, Barak and Shoham, Yoav},
  title   = {The cost of training {NLP} models: A concise overview},
  journal = {arXiv preprint arXiv:2004.08900},
  year    = {2020},
}
@article{shallue2018measuring,
  author  = {Shallue, Christopher J. and Lee, Jaehoon and Antognini, Joseph and Sohl-Dickstein, Jascha and Frostig, Roy and Dahl, George E.},
  title   = {Measuring the effects of data parallelism on neural network training},
  journal = {arXiv preprint arXiv:1811.03600},
  year    = {2018},
}
% NOTE(review): year changed from the exported 2010 to 2018 on the understanding that the SysML conference first ran in 2018 -- confirm against the paper.
% The URL was moved out of the venue name into its own field; the citation key is unchanged.
@inproceedings{shiebler2010making,
  author    = {Shiebler, Dan and Tayal, Abhishek},
  title     = {Making machine learning easy with embeddings},
  booktitle = {SysML},
  year      = {2018},
  url       = {http://www.sysml.cc/doc/115.pdf},
}
@article{simhi2022interpreting,
  author  = {Simhi, Adi and Markovitch, Shaul},
  title   = {Interpreting Embedding Spaces by Conceptualization},
  journal = {arXiv preprint arXiv:2209.00445},
  year    = {2022},
}
@article{steck2021deep,
  author  = {Steck, Harald and Baltrunas, Linas and Elahi, Ehtsham and Liang, Dawen and Raimond, Yves and Basilico, Justin},
  title   = {Deep learning for recommender systems: A {Netflix} case study},
  journal = {AI Magazine},
  volume  = {42},
  number  = {3},
  pages   = {7--18},
  year    = {2021},
}
@book{stevens2020deep,
  author    = {Stevens, Eli and Antiga, Luca and Viehmann, Thomas},
  title     = {Deep Learning with {PyTorch}},
  publisher = {Manning Publications},
  year      = {2020},
}
@inproceedings{svore2009machine,
  author    = {Svore, Krysta M. and Burges, Christopher J. C.},
  title     = {A machine learning approach for improved {BM25} retrieval},
  booktitle = {Proceedings of the 18th ACM conference on Information and knowledge management},
  pages     = {1811--1814},
  year      = {2009},
}
@book{tunstall2022natural,
  author    = {Tunstall, Lewis and Von Werra, Leandro and Wolf, Thomas},
  title     = {Natural Language Processing with Transformers},
  publisher = {O'Reilly Media, Inc.},
  year      = {2022},
}
@inproceedings{ying2018graph,
  author    = {Ying, Rex and He, Ruining and Chen, Kaifeng and Eksombatchai, Pong and Hamilton, William L. and Leskovec, Jure},
  title     = {Graph convolutional neural networks for web-scale recommender systems},
  booktitle = {Proceedings of the 24th ACM SIGKDD international conference on knowledge discovery \& data mining},
  pages     = {974--983},
  year      = {2018},
}
@article{vaswani2017attention,
  author  = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N. and Kaiser, {\L}ukasz and Polosukhin, Illia},
  title   = {Attention is all you need},
  journal = {Advances in neural information processing systems},
  volume  = {30},
  year    = {2017},
}
@article{Wang2020FromST,
  author  = {Wang, Yuxuan and Hou, Yutai and Che, Wanxiang and Liu, Ting},
  title   = {From static to dynamic word representations: a survey},
  journal = {International Journal of Machine Learning and Cybernetics},
  volume  = {11},
  pages   = {1611--1630},
  year    = {2020},
}
@article{wang2019evaluating,
  author    = {Wang, Bin and Wang, Angela and Chen, Fenxiao and Wang, Yuncheng and Kuo, C.-C. Jay},
  title     = {Evaluating word embedding models: Methods and experimental results},
  journal   = {APSIPA Transactions on Signal and Information Processing},
  volume    = {8},
  pages     = {e19},
  publisher = {Cambridge University Press},
  year      = {2019},
}

@article{wewer2021updating,
  author  = {Wewer, Christopher and Lemmerich, Florian and Cochez, Michael},
  title   = {Updating embeddings for dynamic knowledge graphs},
  journal = {arXiv preprint arXiv:2109.10896},
  year    = {2021},
}
@article{wu2023bloomberggpt,
  author  = {Wu, Shijie and Irsoy, Ozan and Lu, Steven and Dabravolski, Vadim and Dredze, Mark and Gehrmann, Sebastian and Kambadur, Prabhanjan and Rosenberg, David and Mann, Gideon},
  title   = {{BloombergGPT}: A large language model for finance},
  journal = {arXiv preprint arXiv:2303.17564},
  year    = {2023},
}
@article{xu2023multimodal,
  author    = {Xu, Peng and Zhu, Xiatian and Clifton, David A.},
  title     = {Multimodal learning with transformers: A survey},
  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  publisher = {IEEE},
  year      = {2023},
}

@article{zhang2019deep,
  author    = {Zhang, Shuai and Yao, Lina and Sun, Aixin and Tay, Yi},
  title     = {Deep learning based recommender system: A survey and new perspectives},
  journal   = {ACM Computing Surveys (CSUR)},
  volume    = {52},
  number    = {1},
  pages     = {1--38},
  publisher = {ACM New York, NY, USA},
  year      = {2019},
}
@article{zhang2020revisiting,
  author  = {Zhang, Tianyi and Wu, Felix and Katiyar, Arzoo and Weinberger, Kilian Q. and Artzi, Yoav},
  title   = {Revisiting few-sample {BERT} fine-tuning},
  journal = {arXiv preprint arXiv:2006.05987},
  year    = {2020},
}
@article{zheng2017multi,
  author  = {Zheng, Yong},
  title   = {Multi-stakeholder recommendation: Applications and challenges},
  journal = {arXiv preprint arXiv:1707.08913},
  year    = {2017},
}
% The exported entry stored a space-mangled URL in the journal field; it is now a web resource with a clean url field.
% NOTE(review): howpublished was inferred from the URL host -- confirm the preferred venue name.
@misc{zinkevich2017rules,
  author       = {Zinkevich, Martin},
  title        = {Rules of machine learning: Best practices for {ML} engineering},
  howpublished = {Google Developers},
  year         = {2017},
  url          = {https://developers.google.com/machine-learning/guides/rules-of-ml},
}
